# Launch wrapper: runs run_mcore_qwen-no-overlap.sh (looked up relative to the
# current working directory) through `sh` with 25 positional arguments.
# This script's exit status is the exit status of that launcher.

# Remove NCCL_QUADRUPLE_CHANNELS from this shell's environment so the launcher
# started below does not inherit it.
unset NCCL_QUADRUPLE_CHANNELS

# Disabled alternatives, kept for reference; none of them is applied.
#export CUDA_VISIBLE_DEVICES=4,5,1,0,9,8,12,13,7,6,2,3,10,11,15,14
#export CUDA_VISIBLE_DEVICES=4,5,7,6,0,1,3,2,9,8,10,11,13,12,14,15
#export CUDA_VISIBLE_DEVICES=4,7,5,6,1,2,0,3,12,15,13,14,9,10,8,11
#export NCCL_SOCKET_IFNAME=eth0
#export MP_VP=2

# Shared path pieces. These are plain (non-exported) shell variables; the
# same dataset path is passed twice, in two consecutive positions.
guosj_root=/mnt/workspace/guosj
wudao_corpus="${guosj_root}/qwen-datasets/wudao_qwenbpe_text_document"

# The arguments are positional, so their order matters. They are grouped per
# line purely for readability; the launcher receives exactly 25 words.
# NOTE(review): the meaning of each position is defined inside
# run_mcore_qwen-no-overlap.sh, which is not shown here -- confirm against its
# $1..$25 handling before reordering or editing any value.
sh run_mcore_qwen-no-overlap.sh \
  dsw 0.5B \
  1 256 \
  1e-5 1e-6 \
  4096 4096 \
  bf16 \
  1 1 1 \
  true true true false false false \
  100000 \
  "${wudao_corpus}" \
  "${wudao_corpus}" \
  "${guosj_root}/qwen-ckpts" \
  10000000000 100 \
  "${guosj_root}/output_mcore_qwen2.5_pretrain"